This file was created with JabRef 1.8b2.
Encoding: ISO8859_1

% PhD thesis: Littman, "Algorithms for Sequential Decision Making" (Brown University, 1996).
@phdthesis{LITTMAN,
  author = {Littman, Michael Lederman},
  title  = {Algorithms for Sequential Decision Making},
  school = {Brown University},
  year   = {1996},
}

% Book: Sutton and Barto, "Reinforcement Learning: An Introduction" (1998).
% The publisher name and the publisher's city are stored in separate fields
% (publisher / address) so that each style can place them as it sees fit.
@book{SUTTON,
  author    = {Sutton, Richard S. and Barto, Andrew G.},
  title     = {Reinforcement Learning: An Introduction},
  publisher = {The MIT Press},
  address   = {Cambridge, Massachusetts},
  year      = {1998},
}

% PhD thesis: Watkins, "Learning from Delayed Rewards" (1989).
@phdthesis{WATKINS,
  author = {Watkins, C. J. C. H.},
  title  = {Learning from Delayed Rewards},
  school = {Cambridge University},
  year   = {1989},
}

% Journal article: Watkins and Dayan, "Technical Note: Q-Learning",
% Machine Learning, volume 8, issue 3-4, 1992.
% Ranges (pages, issue number) use the double-hyphen form so they typeset as
% en-dashes; month uses the predefined three-letter macro (unbraced) so the
% bibliography style controls how it is printed.
@article{QLEARN,
  author  = {Watkins, C. J. C. H. and Dayan, P.},
  title   = {Technical Note: Q-Learning},
  journal = {Machine Learning},
  year    = {1992},
  volume  = {8},
  number  = {3--4},
  pages   = {279--292},
  month   = may,
}

